/*
 * Copyright 2008 Carnegie Mellon University
 * Licensed under the Apache License, Version 2.0 (the "License"); 
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *  
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, 
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied. See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
package edu.cmu.lti.sepia.task.retrieval.indri;

import java.util.Arrays;
import java.util.regex.Pattern;

/**
 * Static helpers for working with Indri query strings.
 */
public class IndriUtil {

  /** A literal space character (tabs and newlines are deliberately not included). */
  private static final Pattern SPACE = Pattern.compile(" ");

  /** A double quote. */
  private static final Pattern DOUBLE_QUOTE = Pattern.compile("\"");

  /** A '#', followed by the shortest run of characters up to and including the next '('. */
  private static final Pattern OPERATOR_PREFIX = Pattern.compile("#.*?\\(");

  /** An opening or closing parenthesis. */
  private static final Pattern PARENTHESIS = Pattern.compile("\\(|\\)");

  /** Runs of literal spaces at the very start or very end of the input. */
  private static final Pattern EDGE_SPACES = Pattern.compile("(^[ ]+)|([ ]+$)");

  /** A '.' followed by at least one more character, up to the end of the line. */
  private static final Pattern FIELD_SUFFIX = Pattern.compile("\\..+");

  /** One or more whitespace characters; used as the term delimiter. */
  private static final Pattern WHITESPACE = Pattern.compile("\\s+");

  /**
   * Returns an array of query terms from the specified Indri query.
   *
   * <p>The query is reduced to plain terms in the following order:
   * <ol>
   *   <li>every literal space character is removed;</li>
   *   <li>every double quote is replaced by a space, so quotes act as the
   *       term delimiters;</li>
   *   <li>every {@code #...(} prefix is collapsed to {@code (};</li>
   *   <li>every parenthesis is replaced by a space;</li>
   *   <li>leading and trailing spaces are trimmed;</li>
   *   <li>everything from the first {@code '.'} that is followed by at least
   *       one character, up to the end of that line, is dropped;</li>
   *   <li>the remainder is split on runs of whitespace.</li>
   * </ol>
   *
   * <p>Because step 1 removes spaces before anything else, terms that are
   * separated only by spaces (and not by quotes or parentheses) are joined
   * into a single term.
   *
   * <p>NOTE(review): step 6 also discards any terms that follow the first
   * {@code '.'} on the same line (including decimal points in numbers).
   * This looks intended for a single trailing field parameter; confirm
   * against the queries callers actually pass before relying on it for
   * multi-term queries with fields.
   *
   * @param indriQuery the Indri query string; may be {@code null}
   * @return the query terms, never {@code null} and never containing an empty
   *         string; an empty array if the query is {@code null} or contains
   *         no terms
   */
  public static String[] getQueryTerms(String indriQuery) {
    if (indriQuery == null) {
      return new String[0];
    }

    String q = SPACE.matcher(indriQuery).replaceAll("");
    q = DOUBLE_QUOTE.matcher(q).replaceAll(" ");
    q = OPERATOR_PREFIX.matcher(q).replaceAll("(");
    q = PARENTHESIS.matcher(q).replaceAll(" ");
    q = EDGE_SPACES.matcher(q).replaceAll("");
    q = FIELD_SUFFIX.matcher(q).replaceAll("");  // For a field parameter

    String[] queryTerms = WHITESPACE.split(q);

    // split() drops trailing empty strings but keeps a single leading one,
    // which appears when the remaining text is empty or starts with
    // whitespace other than a space (e.g. a tab). That is not a real term.
    if (queryTerms.length > 0 && queryTerms[0].length() == 0) {
      return Arrays.copyOfRange(queryTerms, 1, queryTerms.length);
    }
    return queryTerms;
  }

}
